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AE015074 10085 bp DNA linear BCT 18-0CT-2002 

Shigella flexneri 2a str. 301 section 37 of 412 of the complete 
genome. 

AE015074 AE005674 
AE015074.1

Shigella flexneri 2a str. 301
Shigella flexneri 2a str. 301

Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
Enterobacteriaceae; Shigella.

1 (bases 1 to 10085) 

Jin,Q., Yuan,Z.H., Xu,J.G., Wang,Y., Shen,Y., Lu,W.C., Wang,J.H.,
Liu,H., Yang,J., Yang,F., Qu,D., Zhang,X.B., Zhang,J.Y., Yang,G.W.,
Wu,H.T., Dong,J., Sun,L.L., Xue,Y., Zhao,A.L., Gao,Y.S., Zhu,J.P.,
Kan,B., Chen,S.X., Yao,Z.J., He,B.K., Chen,R.S., Ma,D.L.,
Qiang,B.Q., Wen,Y.M., Hou,Y.D. and Yu,J.
Genome sequence of Shigella flexneri 2a: insights into
pathogenicity through comparison with genomes of Escherichia coli
K12 and O157

Nucleic Acids Res. 30 (20), 4432-4441 (2002) 
12384590 

2 (bases 1 to 10085) 

Jin,Q., Shen,Y., Wang,J.H., Liu,H., Yang,J., Yang,F., Zhang,X.B.,
Zhang,J.Y., Yang,G.W., Wu,H.T., Dong,J., Sun,L.L., Xue,Y.,
Zhao,A.L., Gao,Y.S., Zhu,J.P., Chen,S.X., Yao,Z.J., Wang,Y.,
Lu,W.C., Qiang,B.Q., Wen,Y.M. and Hou,Y.D.
Direct Submission 

Submitted (08-MAY-2001) Microbial Genome Center of Chinese Ministry 
of Public Health, 100 YingXin Jie, XuanWu Qu, Beijing 100052, P. R. 
China 

Location/Qualifiers
1..10085

/organism="Shigella flexneri 2a str. 301"

/strain="301"

/serotype="2a"

/db_xref="taxon:198214"

91.. 795 

/gene="adk"

/note=" SF0419" 

91.. 795 

/gene=" adk" 

/note="Residues 2 to 234 of 234 are 98 pct identical to

residues 1 to 233 of a 233 aa protein from Escherichia

coli gb: AAB40228.1"

/codon_start=1

/transl_table=11

/product="adenylate kinase"

/protein_id="AAN42074.1"

/db_xref="GI:24050653"

/translation="MVVSFIAFSKKSTHFKGIFAMRIILLGAPGAGKGTQAQFIMEKY

GIPQISTGDMLRAAVKSGSELGKQAKDIMDAGKLVTDELVIALVKERIAQEDCRNGFL

LDGFPRTIPQADAMKEAGINVDYVLEFDVPDELIVDRIVGRRVHAPSGRVYHVKFNPP

KVEGKDDVTGEELTTRKDDQEETVRKRLVEYHQMTAPLIGYYSKEAEAGNTKYAKVDG

TKQVAEVRADLEKILG"

927. .1889 

/gene=" hemH" 

/note="SF0420" 

927. . 1889 

/gene="hemH"

/note="Residues 1 to 320 of 320 are 98 pct identical to
residues 1 to 320 of a 320 aa protein from Escherichia
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coli 0157:H7 EDL933 ref: NP_2862?6. 1" 

/codon_start=1 

/transl_table=11

/product="ferrochelatase: final enzyme of heme
biosynthesis"
/protein_id="AAN42075.1"
/db_xref="GI:24050654"

/translation="MRQTKTGILLANLGTPDAPTPEAVKRYLKQFLSDRRVVDTSRLL
WWPLLRGVILPLRSPRVAKLYASVWMEDGSPLMVYSRQQQQALAQRLPDTPVALGMSY 
GSPSLESS VDELLAEHVDH I VVLPLYPQFSCSTVGAVWDELAR I LARKRS I PG I SF I R 
DYADNHDY I NALANSVRASFAKHGEPDLLLLS YHG I PQRYADEGDDYPQRCRTTTREL 
ASALGHVPEKVMMTFQSRFGREPWLMPYTDETLKMLGEKGVGHiqVMCPGFAADCLET 
LEE I AEQNRE VFLGAGGKK YEY I PALNATPEH I EMMANLVAAYR" 

gene complement(2027..2845)

/gene="aes"
/note="SF0421"

CDS complement(2027..2845)

/gene="aes"
/EC_number="3.1.1.-"

/note="Residues 1 to 272 of 272 are 98 pct identical to

residues 1 to 272 of a 319 aa protein from Escherichia

coli K12 ref: NP_415009.1"

/codon_start=1

/transl_table=11

/product="putative lipase"

/protein_id="AAN42076.1"

/db_xref="GI:24050655"

/ 1 rans I a t i on=" MKPENKLPVLDL 1 SAEMKTVVNTLQPDLFSWPATGT I AEQRQYY 
TLERRFWNAGAPEMATRAYMVPTKYGQVETRLFCPQPDSPATLFYLHGGGF I LGNLDT 
HDR I MRLLASYSQCTV I G I NYTLSPEARFPQA I EE I VAACCYFHQQAEDYQ I NHSR I G 
FAGDSAGAMLALASALWLRDKQ I DCGK I AGVLLWYGLYGLRDS VTRRLLGGVWDGLTQ 
QDLQMYEEAYLSNDADRESPYYCLFNNDLTREVPPCF I AGAEFDPLLDDSRLLY" 

gene 2997..4301

/gene="gsk" 
/note="SF0422" 

CDS 2997.. 4301 

/gene=" gsk" 

/note="Residues 1 to 434 of 434 are 99 pct identical to

residues 1 to 434 of a 434 aa protein from Escherichia

coli O157:H7 EDL933 ref: NP_286218.1"

/codon_start=1 

/transl_table=11 

/product="inosine-guanosine kinase"
/protein_id="AAN42077.1"
/db_xref="GI:24050656"

/translation="MKFPGKRKSKHYFPVNARDPLLQQFQPENETSAAWVVGIDQTLV 
D I EAKVDDEF I ERYGLSAGHSLV I EDDVAEVLYQELKQKNL I THQFAGGT I GNTMHNY 
S VLADDRSVLLGVMCSN I E I GSYAYRYLCNTSSRTDLNYLQGVDGP I GRCFTL IGESG 
ERTFA I SPGHHNQLRAES I PEDV I AGASALVLTSYLVRCKP6EPMPEATHKA lEYAKK 
YNVPVVLTLGTKFV I AENPQWWQQFLKDHVS I LAMKEDEAEALTGESDPLLASDKALD 
WVELVLCTAGPIGLYMAGFTEDEAKRKTQHPLLPGAIAEFNQYEFSRAMRHKDCQNPL 
RVYSH I APYMGGPEK I MNTNGAGDGALAALLHD I TANSYHRSNVPNSSKHKFTWLTYS 
SLAQVCKYANRVSYQVLNQHSPRLTRGLPEREDSQEESYIVDR" 

gene complement(4434..6110)

/gene="ybaL"
/note="SF0423"

CDS complement(4434..6110)

/gene=" ybaL" 

/note="Residues 1 to 558 of 558 are 99 pct identical to

residues 1 to 558 of a 558 aa protein from Escherichia

coli O157:H7 EDL933 ref: NP_286219.1"

/codon_start=1 

/transl_table=11 

/product="putative transport protein"
/protein_id="AAN42078.1"
/db_xref="GI:24050657"

/t r ans I a t i on=" MHHATPL I TT 1 VGGLVLAF I LGMLANKLR I SPLVGYLLAGVLAG 
PFTPGFVADTKLAPELAELGV I LLMFGVGLHFSLKDLMAVKS I A I PGA I AQ I AVATLL 
GMALSAVLGWSLMTG I VFGLCLSTASTVVLLRALEERQL I DSQRGQ I A I GWL I VEDLV 
MVLTLVLLPAVAGMMEQGDVGFATLAVDMG I T I GKV I AF I A I MMLVGRRLVPW I MARS 
AATGSRELFTLSVLALALG I AFGAVELFDVSFALGAFFAGMVLNESELSHRAAHDTLP 
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LRDAFAVLFFVSVGMLFDPL I L IQQPLAVLATLA 1 1 LFGKSVAALFLVRLFGHSQRTA 
LT 1 AASLAQ I GEFAF I LAGLGMALNLLPQAGQNLVLAGA I LS I MLNPVLFALLEKYLA 
KTETLEEQTLEEA I EEEKQ I PVD I CNHALLVGYGRVGSLLGEKLLASD I PLVV 1 ETSR 
TRVDELRERGVRAVLGNAANEE I MQLAHLECAKWL 1 LT I PNGYEAGE I VASARAKNPD 
I E 1 1 ARAHYDDE VTY I TERGANQVVMGERE I ARTMLELLETPPAGEVVTG" 

gene complement(6348..7568)

/gene="fsr"
/note="SF0424"

CDS complement(6348..7568)

/gene=" fsr" 

/note="Residues 1 to 406 of 406 are 99 pct identical to

residues 1 to 406 of a 406 aa protein from Escherichia

coli O157:H7 EDL933 ref: NP_286220.1"

/codon_start=1

/transl_table=11

/product="fosmidomycin resistance protein"
/protein_id="AAN42079.1"
/db_xref="GI:24050658"

/t rans I at i on=" MAMSEQTQPVAGAAASTTKARTSFG I LGAI SLSHLLNDMI QSL I 
LAIYPLLQSEFSLTFMQlGMiTLTFQLASSLLQPVVGYWTDKYPMPWSLPIGMCFTLS 
GLVLLALAGSFGAVLLAAALVGTGSS VFHPESSRVARMASGGRHGLAQS I FQVGGNFG 
SSLGPLLAAV II APYGKGNVAWFVLAALLA I VVLAQ I SRWYSAQHRMNKGKPKAT 1 1 N 
PLPRNKVVLAVS I LL I L I FSKYFYMAS I S SYYTFYLMQKFGLS I QNAQLHLFAFLFAV 
AAGTV I GCPVCDK I GRKYV I WGS I LGVAPFTL I LPYARLHWTGVLTV 1 1 GF I LASAFS 
A I LVYAQELLPGR I GMVSGLFFGFAFGMGGLGAAVLGLI ADHTS I ELVYK I CAFLPLL 
GMLTIFLPDNRHKD" 
gene 7786. . 9438 

/note="SF0425" 
CDS 7786.. 9438 

/gene="ushA"

/note="Residues 1 to 550 of 550 are 99 pct identical to

residues 1 to 550 of a 550 aa protein from Escherichia

coli K12 ref: NP_415013.1"

/codon_start=1 

/transl_table=11 

/product="UDP-sugar hydrolase (5'-nucleotidase)"
/protein_id="AAN42080.1"
/db_xref="GI:24050659"

/ 1 r ans I a t i 0 n=" MKLLQRGVALALLTTFTLASETALAYEQDKTYK I TVLHTNDHHG 
HFWRNEYGEYGLAAQKTLVDG I RKEVAAEGGSVLLLSGGD I NTGVPESDLQDAEPDFR 
GMNLVGYDAMA I GNHEFDNPLTVLRQQEKWAKFPLLSAN I YQKSTGERLFKPWALFKR 
QDLKIAVIGLTTDDTAKIGNLEYFTDIEFRKPADEAKLVIQELQQTEKPDI I lAATHM 
GHYDNGEHGSNAPGDVEMARALPAGSLAM I VGGHSQDPVCMAAENKKQVDYVPGTPCK 
PDQQNG I W I VQAHEWGK YVGRADFEFRMGEMKMVN YQL I P VNLKKKVTWEDGKSERVL 
YTPE I AENQQM I SLLSPFQNKGKAQLE VK I GKTNGRLEGDRDKVRFVQTNMGRL I lAA 
QHDRTGADFAVMSGGG I RDS I EAGD 1 SYKNVLKVQPFGNVVVYADMTGKEV I DYLTAV 
AQMKPDSGAYPQFANVSFVAKDGKLNDLK I KGEPVDPAKTYRMATLNFNATGGDGYPR 
LDNKPGYVNTGFIDAEVLKAYIQKSSPLDVSVYEPKGEVSWQ" 

gene complement (9475. . 9954) 

/gene=" ybaK" 
/note="SF0426" 

CDS complement(9475..9954)

/gene="ybaK"

/note="Residues 1 to 159 of 159 are 100 pct identical to

residues 1 to 159 of a 159 aa protein from Escherichia

coli K12 ref: NP_415014.1"

/codon_start=1 

/transl_table=11 

/product="orf , conserved hypothetical protein" 
/protein_id="AAN42081. 1" 
/db_xref="GI : 24050660" 

/trans I a t i on="MTPAVKLLEKNK 1 SFQ I HTYEHDPAETNFGDEVVKKLGLNPDQV 
YKTLLVAVNGDMKHLAVAVTPVAGQLDLKKVAKALGAKKVEMADPHVAQRSTGYLVGG 
I SPLGQKKRLPT 1 1 DAPAQEFAT I YVSGGKRGLD I ELAAGOLAK I LDAKFAD I ARRD" 

BASE COUNT 2628 a 2586 c 2607 g 2264 t 

ORIGIN 

1 gcatttttct tttcatcatc tgtactttcc gcaaattatc tcgccattaa ccgtttcagc 
61 ctcaggtgcc tttcttgagg caatcgcctg ttggtggtat cgtttatcgc tttttcaaaa 
121 aaatcgacac attttaaggg gattttcgca atgcgtatca ttctgcttgg cgctccgggc 
181 gcggggaaag ggactcaggc tcagttcatc atggagaaat atggtattcc gcaaatctcc 
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241 actggcgata tgctgcgtgc tgcggtcaaa 

301 gacattatgg atgctggcaa actggtcacc 

361 cgcattgctc aggaagactg ccgtaatggt 

421 ccgcaggcag acgcgatgaa agaagcgggc 

481 gtaccggacg aactgattgt tgatcgtatc 

541 cgtgtttatc acgttaaatt caatccgccg 

601 gaagaactga ctacccgtaa agacgatcag 

661 taccatcaga tgactgcacc gctgatcggc 

721 accaaatacg cgaaagttga cggtaccaag 

781 aaaatcctcg gctaatcaag ccgcagcaga 

841 tcaggcaata cctctcacag caattagttc 

901 acaagttgaa tcgataagag gcggtaatgc 

961 acctgggtac gcccgatgcc cccacacctg 

1021 taagcgacag acgcgtggtt gatacctcac 

1081 tgattttgcc gctgcgctcg ccgcgtgtgg 

1141 acggctcgcc gctgatggtt tacagccgcc 

1201 cggatacgcc agtggcgctg ggcatgagct 

1261 atgaactcct ggcagagcat gtagatcata 

1321 cctgttctac ggtcggtgcg gtatgggatg 

1381 gcattccggg gatatcgttt attcgtgatt 

1441 tggcgaacag cgtacgcgct tcttttgcca 

1501 cttatcatgg cattccccag cgttatgcag 

1561 gcacaacgac tcgcgaactg gcttccgcac 

1621 cctttcagtc gcgctttggc cgggaaccct 

1681 aaatgctcgg agaaaaaggc gtaggtcata 

1741 attgtctgga gacgctggaa gagattgccg 

1801 gcgggaaaaa atatgaatat attccagcgc 

1861 tggctaatct tgttgccgcg tatcgctaaa 

1921 gaagagcctc gtcggcggtt ttcatcatcc 

1981 ctgggtagag tttgaactca cagggctgct 

2041 ggctgtcatc cagcagcgga tcgaactccg 

2101 gagtgagatc attattaaac agacagtaat 

2161 aatacgcctc ttcatacatc tgcaaatcct 

2221 acagacgacg agtcacggaa tcccgtaatc 

2281 caattttacc gcaatcgatc tgtttatcac 

2341 tggcacctgc ggaatcaccg gcaaagccaa 

2401 cctgctggtg gaaataacaa caagcagcca 

2461 cttcaggtga aagggtgtaa ttaataccaa 

2521 ggcgcatgat gcgatcgtgg gtatcgagat 

2581 aaaatagcgt cgccgggcta tctggctgcg 

2641 attttgttgg aaccatgtaa gctctggttg 

2701 ggcgctcaag cgtgtaatac tgtcgttgct 

2761 gtaaatccgg ctgaagagta ttcacaacgg 

2821 caggtagttt gttttccggc ttcatacaaa 

2881 accactgcca tgaaaatgcg atcccgcctg 

2941 ctcccgtcag attgtgttaa cattcgccgc 

3001 aatttcccgg taaacgtaaa tccaaacatt 

3061 ttcagcaatt ccagccagaa aacgaaacca 

3121 cgctggtcga tattgaagcg aaagtggatg 

3181 ccgggcattc actggtgatt gaggatgacg 

3241 agaaaaacct gattacccat cagtttgcgg 

3301 actcggtgct cgcggacgac cgttcggtgc 

3361 ttggcagtta tgcctatcgt tacctgtgta 

3421 tacaaggcgt ggatggtccg attggtcgtt 

3481 gtacctttgc tatcagtcca ggccacatga 

3541 atgtgattgc cggagcctcg gcactggttc 

3601 gtgaacccat gccggaagca accatgaaag 

3661 cggtggtgct cacgctgggc accaagtttg

3721 aattcctcaa agaccacgtt tctatccttg 

3781 ccggagaaag cgatccgttg ttggcatctg 

3841 tgtgcaccgc cgggccaatc ggcttgtata 

3901 gtaaaaccca gcatccgctg ctgccgggcg 

3961 gccgcgccat gcgccacaag gattgccaga 

4021 cgtacatggg cgggccggaa aaaatcatga 

4081 cagcgttgct gcatgacatt accgccaaca 

4141 gcaaacataa attcacctgg ttaacttatt 

4201 accgtgtgag ctatcaggta ctgaaccagc 

4261 agcgtgaaga cagccaggaa gagtcttact 

4321 ccagataagg cgttcacgcc gcatctggca 

4381 cgcgtcttat catgcctaca tatttttcat 

4441 gtcaccactt cacccgccgg tggcgtttcc 



tctggctccg agctgggtaa acaagcaaaa 
gacgaactgg tgatcgcgct ggttaaagag 
ttcctgttgg acggcttccc gcgtaccatt 
atcaatgttg attacgttct ggaattcgac 
gtaggccgcc gcgttcatgc gccgtctggt 
aaagtagaag gcaaagacga cgttaccggt 
gaagaaaccg tgcgtaaacg tctggttgaa
tactactcca aagaagcgga agcgggtaac 
caggttgctg aagttcgcgc tgatctggaa 
tctgctttcg ggcaggtctg cttatccacc 
ttcttcctca cttttccgct acaattatca 
gtcagactaa aaccggtatc ctgctggcaa 
aagcggtaaa acgctatctg aaacaatttt 
ggttgttatg gtggccgttg ctgcgcggcg 
cgaagctgta cgcctctgtc tggatggaag 
agcaacagca ggcgttggca caacgtttac 
acggctcgcc atcactggaa agctccgtcg 
ttgtggtgct gccgctttat ccgcaattct 
aactggcacg cattctggcg cgcaaacgta 
acgccgataa ccacgattac attaatgcac 
aacatggcga accggatctg ctgctgctct 
atgaaggcga tgattacccg caacgttgcc 
tggggatggt accggaaaaa gtgatgatga 
ggctgatgcc ttataccgac gaaacgctga 
tacaggtgat gtgcccgggc tttgctgcgg 
agcaaaaccg tgaggtcttc ctcggtgcgg 
ttaatgccac gccggaacat atcgaaatga 
gctgagcggt aaagaactga gcgccgtcgc 
gtgaataatg caaaaaggca tgcagcgtac 
gatgcgccgc taacgtctag taaagcagac 
ccccggcaat aaaacagggc ggaacttcgc 
acggtgactc gcggtccgcg tcgttgctta 
gttgcgttaa gccatcccag acaccgccca 
cgtaaagccc ataccacagc aaaacacccg 
gcaaccacaa cgcactggcg agcgccagca 
tgcgggacat attgatttga taatcctccg 
caatttcctc tatcgcttgt ggaaaacgcg 
tcaccgtaca ttggctgtag cttgccagca 
tgccgagaat aaaaccgcct ccatgcaaat 
gacaaaagag acgtgtttcc acctgcccat 
ccatttctgg agcgcccgca ttccagaatc 
cagcaatcgt tcccgttgcg ggccaggacg 
tcttcatttc agcagaaata aggtccagaa 
aactcctttc aaattacgtc attgtaagga 
ctgatattga aactggctgc gtctcgcgcg 
tcagttaacc acccgtaaaa acaaccatga 
acttccctgt aaatgcacgc gatccgctgc 
gcgccgcctg ggtcgtaggt attgaccaga 
atgaattcat tgagcgttat ggattaagcg 
tagccgaagt gctttatcag gagctaaaac 
gtggcaccat tggtaacacc atgcacaact 
tgctgggcgt catgtgcagc aatattgaaa 
acacttccag ccgtaccgat cttaactatc 
gctttacgct gattggcgag tccggggaac 
accagctgcg ggctgaaagc attccggaag 
tcacctcata tctggtgcgt tgcaagccgg 
ccattgagta cgcgaagaaa tataacgtac 
tcattgccga gaatccgcag tggtggcagc 
cgatgaacga agatgaagcc gaagcgttga 
acaaggcgct ggactgggta gagctggtgc 
tggcgggctt taccgaagac gaagcgaaac
ctatagcgga attcaaccag tatgagttta 
atccgctgcg tgtctattcg cacattgcgc 
acactaatgg agcgggggat ggcgcattgg 
gctaccatcg tagcaacgta ccaaactcca 
catcgttagc gcaggtgtgt aaatatgcta 
attcacctcg tttaacgcgc ggcttgccgg 
gggatcgtta agttatcgtc ggttcgtagg 
tttggctctc gatgcctgat gcgacgctgg 
attttacatc cggcaaccac cgtttacccc 
agcagttcca gcatagtacg ggcaatttca 
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4501 cgttcaccca tcactacctg attcgcgcca 

4561 taatgggcgc gggcgataat ctcaatatcc 

4621 tcacccgctt cataaccgtt ggggatcgtc 

4681 gccagttgca taatttcttc gttcgctgca 

4741 cgcagctcat caacacgggt tcgtgacgtc 

4801 agcaatttct cccccagcag gctgcctaca 

4861 caaatatcca ctgggatctg tttctcttct 

4921 agcgtttcgg tcttcgccag atatttctcc 

4981 atcgacagga tcgcccctgc cagtaccagg 

5041 gccattccca gtcccgccag gataaacgcg 

5101 atggttaatg ccgtacgttg ggagtgacca 

5161 gatttaccaa acagaataat tgccagcgtc 

5221 attaacggat caaacaacat cccgactgag 

5281 aatggcaacg tatcgtgggc ggcacggtga 

5341 gcaaagaacg caccgagtgc aaaggagaca 

5401 cctaacgcca gcgccagcac tgacagggta 

5461 cgtgccataa tccacggcac cagacggcga 

5521 atcaccttgc cgatgglgat ccccatatcg 

5581 tgttccatca ttcctgccac tgcgggcagc 

5641 tccacaatca accaaccgat ggcgatttgc 

5701 tcaagtgcgc gcagtaacac cacggtactg 

5761 ccggtcatta acgaccagcc cagcacggcg 

5821 gctatctggg cgatcgcgcc gggaatggcg 

5881 gaaaaatgca aaccgacgcc gaacatcagc 

5941 gcaagcttgg tatcggcaac aaagcccgga 

6001 agatatccca ccagaggaga aatacgtagt 

6061 agcacaaggc cgccaacaat ggtggtgata 

6121 tttcctggtg gttattgtcc attttgggct 

6181 tgacaatttc attgatgatg tttatgaata 

6241 gctgcaaaaa aagcacggtt cggaaaacag 

6301 cgactgtaaa acgatgcagc caaagtttgc 

6361 cggttatcag gcaggaatat ggtcaacatc 

6421 tagactaact cgatgctggt gtgatcggcg 

6481 cccatgccga aagcaaaacc gaaaaagagt 

6541 agctcctgag cgtagaccag aatggcagag 

6601 accgttaaaa cccccgtcca gtgcaggcgg 

6661 acgccgagga tagagcccca aatcacatat 

6721 ccgatcaccg tacctgccgc aacggcaaac 

6781 tggatagata atccgaattt ttgcatcaga 

6841 atatagaaat atttcgagaa aatgaggatt 

6901 ttgcgcggca gtggattgat tatcgtcgct 

6961 gccgagtacc aacggctaat ttgcgccaac 

7021 aaccaggcaa cgttgccttt gccataaggc 

7081 agggaactgc caaagttgcc gccgacctga 

7141 ccggaagcca tacgggctac gcgagaagat 

7201 accagcgccg ctgccagcag aactgcgcca 

7261 ccacttaagg taaagcacat gccaattggc 

7321 cagtagccga ccactggttg cagtagcgaa 

7381 ccaatctgca taaatgtcag agaaaattct 

7441 agcgattgga tcatgtcgtt cagcagatgt 

7501 gatgttcggg ccttggtcgt tgacgcagcc 

7561 attgccatag gaaagtcact ttttcagggt 

7621 tattacccga ctaacatacc tgtatgcgtc 

7681 aatttctaat ctggatgcag atttatcttc 

7741 tcatactatt tttcaacacg ttgaaatcag 

7801 cggggcgtgg cgttagcgct gttaaccaca 

7861 tatgagcagg ataaaaccta caaaattaca 

7921 ttttggcgca atgaatatgg cgaatatggt 

7981 atccgcaaag aggttgcggc tgaaggcggt 

8041 aacactggcg tgcccgagtc tgacttacag 

8101 ctggtgggct atgacgcgat ggcgatcggt 

8161 ttacgccagc aggaaaagtg ggccaagttc 

8221 agtactggcg agcgcctgtt taaaccgtgg 

8281 gccgttattg ggctgacaac cgatgacaca 

8341 gatatcgaat ttcgtaagcc cgccgatgaa 

8401 acagaaaagc cagacattat tatcgcggcg 

8461 cacggctcta acgcaccggg cgatgtggag 

8521 gcgatgatcg tcggtggtca ctcgcaagat 

8581 caggtcgatt acgtgccggg tacgccatgc 

8641 gtgcaggcgc atgagtgggg caaatacgtg 

8701 gaaatgaaaa tggttaacta ccagctgatt 



cgttcggtga tatacgtcac ttcatcgtca 
gggtttttcg cgcgggcaga cgccacaatc 
aggatcagcc attttgcaca ttccagatgt 
ttgcccaata cagcgcggac cccacgctct 
tcaatcacca ccagcggaat atcagaggcg 
cgaccgtaac ccaccaatag cgcatggttg 
tcgattgcct cttccagcgt ctgctcttcc 
agtagtgcga acagtaccgg gttgagcata 
ttttgtccgg cctgcggcag taaattcaat 
aactcaccaa tctgcgccag gctggcggcg 
aacagacgga caaggaacag ggccgcgacc 
gccagcactg ccagcggttg ctgaatcaga 
acaaaaaaca gcaccgcaaa cgcgtcgcgc 
ctcaattcag actcgttcag taccatcccg 
tcaaacagct ctaccgcacc aaaggcaatc 
aacagctcgc gagaaccggt tgccgcgctg 
cctaccagca tcataatggc gataaatgcg 
actgcaagag tggcaaagcc cacatcgccc 
aacaccagcg tcagaaccat caccaggtct 
ccacgctgac tgtctattaa ttgccgttct 
gcggtggaaa gacataagcc gaacacgata 
gagagcgcca tacccagcag cgtcgccacg 
atggacttta ccgccatcaa atccttgagc 
aaaataacgc ccagttcagc cagttccggc 
gtgaatggtc ctgccagcac acccgctaac 
ttattggcca gcatgccgag gataaaggcg 
agcggggtgg cgtgatgcat tccgtctcct 
gggaaaacca aaattacagg taatagttta 
attgttgaat tttgcagaaa aatggaatta 
aaggcggttt aacagaggaa aggcttatgg 
ctttggctgc aatgaaatca gtctttatgc 
cccaatagtg gcaggaaagc acagatttta 
ataagcccca gaactgccgc tcccagacct 
ccagaaacca taccgatacg tcccggaagt 
aatgccgaag cgaggataaa tccaataatc 
gcgtagggta aaatcagcgt aaacggcgca 
ttccgtccaa ttttatcccc tacaggcccg 
aggaaggcaa acagatgaag ctgggcattc 
taaaaggtgt aatagctgct gatgctcgcc 
aacagaatgc tgactgccag taccactttg 
ttgggttttc ctttattcat tcggtgctgt 
accacgatcg ccagcagtgc cgcaagcaca 
gcgataatca ccgccgccag caagggtccc 
aagatagatt gcgccaggcc atgccgcccg 
tccggatgaa agaccgatga accggtaccg 
aaactgcccg ccagcgcaag cagcaccaga 
aacgaccacg gcatcggata tttatcggtc 
gaggcgagct ggaaggtgag ggttatcatg 
gactgaagca gcggataaat cgccagaatc 
gagaggctga tagcacctaa aataccaaac 
gcgcccgcca caggctgggt ttgttcactc 
tgcgatgtaa agaatgatct tatttgtgat 
gtctgaagga agtctcaacg ccgaatacag 
accggacgca gacttgtcta tgatgttgcg 
gtcagggaga gaagtatgaa attattgcag 
tttacactgg cgagtgaaac tgctctggcg 
gttctgcata ccaatgatca tcatgggcat 
ctggcggcgc aaaaaacgct ggtggatggt 
agcgtgctgc tactttccgg tggcgacatt 
gatgccgaac ctgattttcg cggtatgaat 
aatcatgaat ttgataatcc gctcaccgta 
ccgttgcttt ccgcgaatat ctaccagaaa 
gcgctgttta agcgtcagga tctgaaaatt 
gcaaaaattg gtaacctgga atacttcact 
gcgaagctgg tgattcagga gctgcaacag 
acccatatgg ggcattacga taatggtgag 
atggcacgcg cgctgcctgc cggatcgctg 
ccggtctgca tggcggcaga aaacaaaaaa 
aaaccagatc aacaaaacgg catctggatt 
ggacgggctg attttgagtt tcgtaatggc 
ccggtgaacc tgaagaagaa agtgacctgg 
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6/6 



8761 
8821 
8881 
8941 
9001 
9061 
9121 
9181 
9241 
9301 
9361 
9421 
9481 
9541 
9601 
9661 
9721 
9781 
9841 
9901 
9961 
10021 
10081 



// 



gaagacggga 
atctcgctgt 
aaaaccaatg 
gggcggttga 
ggaggcggaa 
gtgcagccat 
tacctgaccg 
gttagctttg 
gatccggcga 
tatccgcgcc 
ctgaaagcgt 
gaggtgagct 
gcggcgggcg 
ttcgatatcc 
ggcgtcgata 
gtatcccgtc 
cgcttttgct 
gtgtttcata 
acctaatttt 
atggatttga 
tttcctgcct 
agtcatcttg 
gtcgc 



aaagcgagcg 
tatcaccgtt 
gtcgtctgga 
ttctggcagc 
ttcgtgattc 
tcggcaatgt 
ccgtcgcgca 
tggcgaaaga 
aaacttaccg 
ttgataacaa 
atatccagaa 
ggcagtaatc 
atatcagcaa 
agtccgcgct 
atcgttggca 
gaacgctgcg 
acttttttaa 
tcaccgttca 
ttgacgactt 
aacgaaatct 
taaacaaaaa 
cctaagagta 



cgtgctttac 
ccagaacaaa 
aggcgatcgt 
ccaaatggat 
tatcgaagca 
ggtggtgtat 
gatgaagcca 
cggcaaactg 
tatggcgaca 
accgggctat 
aagctcgccg 
cgaaagtgcc 
atttggcatc 
tgccgccgga 
gacgtttttt 
cgaccatcgg 
gatccagt tg 
ctgccaccag 
catcgccaaa 
tgtltttttc 
aacgaagcaa 
ttggcaggat 



actcctgaaa 
ggcaaagcgc 
gacaaagtgc 
cgcactggtg 
ggcgatatca 
gccgacatga 
gattcaggtg 
aacgacctta 
t taaact tea 
gtgaataccg 
ctggatgtga 
ggatgtt tgc 
gaggatcttt 
aacataaata 
ctgccccagt 
atcggccatc 
acctgcgacc 
cagcgtt ttg 
attggtttca 
gagtaat t ta 
gcatacgcct 
ggtgagattg 



tcgctgaaaa 
agctggaagt 
gttttgtaca 
ccgactttgc 
gctataaaaa 
ccggtaaaga 
cctacccgca 
aaatcaaagg 
atgccaccgg 
gctttattga 
gtgt ttatga 
atccggcaca 
gccagatcgc 
gtggcaaatt 
gggctaatcc 
tcaactttct 
ggcgtaacgg 
tagacctgat 
gccggatcgt 
actgcgggtg 
gatggcggtc 
agcgacaatc 



ccagcaaatg 
gaaaataggc 
gaccaatatg 
ggtgatgagc 
cgtgctgaaa 
ggtgat tgat 
atttgccaac 
cgaaccggtc 
cggtgatgga 
tgccgaagtg 
accgaaaggt 
atgcttaatc 
ctgccgccag 
cttgtgcggg 
ccccaaccag 
tggcacccag 
ccacggcaag 
ccggat tcaa 
gctcgtaggt 
tcatggtaat 
caaaaaaaag 
gagttacacc 
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